mtcars %>% lm(mpg ~ wt + cyl, .)
# Sample
mtcars %>% dplyr::sample_n(10) %>% lm(mpg ~ wt + cyl, .)
# Profile
profvis::profvis(mtcars %>% lm(mpg ~ wt + cyl, .))
# Scale Up
cloudml::cloudml_train("train.R")
# Scale Out
mtcars_tbl %>% sparklyr::ml_linear_regression(mpg ~ wt + cyl)
Attribution: Javier Luraschi’s talk slides from SDSS 2019
Source: Zaharia et al. (2016). Apache Spark: A Unified Engine for Big Data Processing
(and sparklyr)
sparklyr